See corpora on Wiktionary
{
"head_templates": [
{
"args": {
"1": "en",
"2": "noun form"
},
"expansion": "corpora",
"name": "head"
}
],
"lang": "English",
"lang_code": "en",
"pos": "noun",
"senses": [
{
"categories": [
{
"kind": "other",
"name": "English entries with incorrect language header",
"parents": [],
"source": "w"
},
{
"kind": "other",
"name": "English plurals in -ra with singular in -s",
"parents": [],
"source": "w"
},
{
"kind": "other",
"name": "Pages with 4 entries",
"parents": [],
"source": "w"
},
{
"kind": "other",
"name": "Pages with entries",
"parents": [],
"source": "w"
}
],
"form_of": [
{
"word": "corpus"
}
],
"glosses": [
"plural of corpus"
],
"id": "en-corpora-en-noun-BvqyzxlP",
"links": [
[
"corpus",
"corpus#English"
]
],
"tags": [
"form-of",
"plural"
]
}
],
"sounds": [
{
"ipa": "/ˈkɔːpəɹə/",
"tags": [
"Received-Pronunciation"
]
},
{
"audio": "LL-Q1860 (eng)-Vealhurl-corpora.wav",
"mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/d/dd/LL-Q1860_%28eng%29-Vealhurl-corpora.wav/LL-Q1860_%28eng%29-Vealhurl-corpora.wav.mp3",
"ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/d/dd/LL-Q1860_%28eng%29-Vealhurl-corpora.wav/LL-Q1860_%28eng%29-Vealhurl-corpora.wav.ogg"
},
{
"ipa": "/ˈkɔɹpəɹə/",
"tags": [
"General-American"
]
}
],
"word": "corpora"
}
{
"head_templates": [
{
"args": {
"1": "nl",
"2": "noun form"
},
"expansion": "corpora",
"name": "head"
}
],
"lang": "Dutch",
"lang_code": "nl",
"pos": "noun",
"senses": [
{
"categories": [
{
"_dis": "71 29",
"kind": "other",
"name": "Dutch entries with incorrect language header",
"parents": [],
"source": "w+disamb"
},
{
"_dis": "50 50",
"kind": "other",
"name": "Pages with 4 entries",
"parents": [],
"source": "w+disamb"
},
{
"_dis": "50 50",
"kind": "other",
"name": "Pages with entries",
"parents": [],
"source": "w+disamb"
}
],
"form_of": [
{
"word": "corpus"
}
],
"glosses": [
"plural of corpus"
],
"id": "en-corpora-nl-noun-BvqyzxlP",
"links": [
[
"corpus",
"corpus#Dutch"
]
],
"tags": [
"form-of",
"plural"
]
},
{
"categories": [
{
"_dis": "50 50",
"kind": "other",
"name": "Pages with 4 entries",
"parents": [],
"source": "w+disamb"
},
{
"_dis": "50 50",
"kind": "other",
"name": "Pages with entries",
"parents": [],
"source": "w+disamb"
}
],
"form_of": [
{
"word": "corps"
}
],
"glosses": [
"plural of corps"
],
"id": "en-corpora-nl-noun-UdovTeyA",
"links": [
[
"corps",
"corps#Dutch"
]
],
"tags": [
"form-of",
"plural"
]
}
],
"sounds": [
{
"audio": "Nl-corpora.ogg",
"mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/f/fa/Nl-corpora.ogg/Nl-corpora.ogg.mp3",
"ogg_url": "https://upload.wikimedia.org/wikipedia/commons/f/fa/Nl-corpora.ogg"
}
],
"word": "corpora"
}
{
"head_templates": [
{
"args": {
"1": "la",
"2": "noun form"
},
"expansion": "corpora",
"name": "head"
}
],
"lang": "Latin",
"lang_code": "la",
"pos": "noun",
"senses": [
{
"categories": [
{
"kind": "other",
"name": "Latin entries with incorrect language header",
"parents": [],
"source": "w"
},
{
"kind": "other",
"name": "Pages with 4 entries",
"parents": [],
"source": "w"
},
{
"kind": "other",
"name": "Pages with entries",
"parents": [],
"source": "w"
}
],
"form_of": [
{
"word": "corpus"
}
],
"glosses": [
"nominative/accusative/vocative plural of corpus"
],
"id": "en-corpora-la-noun-hOoNCdPP",
"links": [
[
"corpus",
"corpus#Latin"
]
],
"tags": [
"accusative",
"form-of",
"nominative",
"plural",
"vocative"
]
}
],
"word": "corpora"
}
{
"etymology_templates": [
{
"args": {
"1": "pt",
"2": "la",
"3": "corpora"
},
"expansion": "Unadapted borrowing from Latin corpora",
"name": "ubor"
}
],
"etymology_text": "Unadapted borrowing from Latin corpora, plural of corpus.",
"head_templates": [
{
"args": {
"1": "pt",
"2": "noun form",
"head": "corpora"
},
"expansion": "corpora",
"name": "head"
}
],
"hyphenations": [
{
"parts": [
"cor",
"po",
"ra"
]
}
],
"lang": "Portuguese",
"lang_code": "pt",
"pos": "noun",
"senses": [
{
"categories": [
{
"kind": "other",
"name": "Pages with 4 entries",
"parents": [],
"source": "w"
},
{
"kind": "other",
"name": "Pages with entries",
"parents": [],
"source": "w"
},
{
"kind": "other",
"name": "Portuguese entries with incorrect language header",
"parents": [],
"source": "w"
}
],
"form_of": [
{
"word": "corpus"
}
],
"glosses": [
"plural of corpus"
],
"id": "en-corpora-pt-noun-BvqyzxlP",
"links": [
[
"corpus",
"corpus#Portuguese"
]
],
"tags": [
"form-of",
"plural"
]
}
],
"sounds": [
{
"ipa": "/ˈkɔʁ.po.ɾɐ/",
"tags": [
"Brazil"
]
},
{
"ipa": "[ˈkɔh.po.ɾɐ]",
"tags": [
"Brazil"
]
},
{
"ipa": "/ˈkɔʁ.po.ɾɐ/",
"tags": [
"Brazil"
]
},
{
"ipa": "[ˈkɔh.po.ɾɐ]",
"tags": [
"Brazil"
]
},
{
"ipa": "/ˈkɔɾ.po.ɾɐ/",
"tags": [
"São-Paulo"
]
},
{
"ipa": "/ˈkɔʁ.po.ɾɐ/",
"tags": [
"Rio-de-Janeiro"
]
},
{
"ipa": "[ˈkɔχ.po.ɾɐ]",
"tags": [
"Rio-de-Janeiro"
]
},
{
"ipa": "/ˈkɔɻ.po.ɾɐ/",
"tags": [
"Caipira"
]
},
{
"ipa": "/ˈkɔʁ.po.ɾa/",
"tags": [
"Southern-Brazil"
]
},
{
"ipa": "[ˈkɔh.po.ɾa]",
"tags": [
"Southern-Brazil"
]
},
{
"ipa": "/ˈkɔɾ.pu.ɾɐ/",
"tags": [
"Portugal"
]
},
{
"rhymes": "-ɔʁpoɾɐ"
},
{
"rhymes": "-ɔɾpuɾɐ"
}
],
"word": "corpora"
}
{
"categories": [
"Dutch entries with incorrect language header",
"Dutch non-lemma forms",
"Dutch noun forms",
"Pages with 4 entries",
"Pages with entries"
],
"head_templates": [
{
"args": {
"1": "nl",
"2": "noun form"
},
"expansion": "corpora",
"name": "head"
}
],
"lang": "Dutch",
"lang_code": "nl",
"pos": "noun",
"senses": [
{
"form_of": [
{
"word": "corpus"
}
],
"glosses": [
"plural of corpus"
],
"links": [
[
"corpus",
"corpus#Dutch"
]
],
"tags": [
"form-of",
"plural"
]
},
{
"form_of": [
{
"word": "corps"
}
],
"glosses": [
"plural of corps"
],
"links": [
[
"corps",
"corps#Dutch"
]
],
"tags": [
"form-of",
"plural"
]
}
],
"sounds": [
{
"audio": "Nl-corpora.ogg",
"mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/f/fa/Nl-corpora.ogg/Nl-corpora.ogg.mp3",
"ogg_url": "https://upload.wikimedia.org/wikipedia/commons/f/fa/Nl-corpora.ogg"
}
],
"word": "corpora"
}
{
"head_templates": [
{
"args": {
"1": "en",
"2": "noun form"
},
"expansion": "corpora",
"name": "head"
}
],
"lang": "English",
"lang_code": "en",
"pos": "noun",
"senses": [
{
"categories": [
"English entries with incorrect language header",
"English non-lemma forms",
"English noun forms",
"English plurals in -ra with singular in -s",
"Pages with 4 entries",
"Pages with entries"
],
"form_of": [
{
"word": "corpus"
}
],
"glosses": [
"plural of corpus"
],
"links": [
[
"corpus",
"corpus#English"
]
],
"tags": [
"form-of",
"plural"
]
}
],
"sounds": [
{
"ipa": "/ˈkɔːpəɹə/",
"tags": [
"Received-Pronunciation"
]
},
{
"audio": "LL-Q1860 (eng)-Vealhurl-corpora.wav",
"mp3_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/d/dd/LL-Q1860_%28eng%29-Vealhurl-corpora.wav/LL-Q1860_%28eng%29-Vealhurl-corpora.wav.mp3",
"ogg_url": "https://upload.wikimedia.org/wikipedia/commons/transcoded/d/dd/LL-Q1860_%28eng%29-Vealhurl-corpora.wav/LL-Q1860_%28eng%29-Vealhurl-corpora.wav.ogg"
},
{
"ipa": "/ˈkɔɹpəɹə/",
"tags": [
"General-American"
]
}
],
"word": "corpora"
}
{
"head_templates": [
{
"args": {
"1": "la",
"2": "noun form"
},
"expansion": "corpora",
"name": "head"
}
],
"lang": "Latin",
"lang_code": "la",
"pos": "noun",
"senses": [
{
"categories": [
"Latin entries with incorrect language header",
"Latin non-lemma forms",
"Latin noun forms",
"Pages with 4 entries",
"Pages with entries"
],
"form_of": [
{
"word": "corpus"
}
],
"glosses": [
"nominative/accusative/vocative plural of corpus"
],
"links": [
[
"corpus",
"corpus#Latin"
]
],
"tags": [
"accusative",
"form-of",
"nominative",
"plural",
"vocative"
]
}
],
"word": "corpora"
}
{
"etymology_templates": [
{
"args": {
"1": "pt",
"2": "la",
"3": "corpora"
},
"expansion": "Unadapted borrowing from Latin corpora",
"name": "ubor"
}
],
"etymology_text": "Unadapted borrowing from Latin corpora, plural of corpus.",
"head_templates": [
{
"args": {
"1": "pt",
"2": "noun form",
"head": "corpora"
},
"expansion": "corpora",
"name": "head"
}
],
"hyphenations": [
{
"parts": [
"cor",
"po",
"ra"
]
}
],
"lang": "Portuguese",
"lang_code": "pt",
"pos": "noun",
"senses": [
{
"categories": [
"Pages with 4 entries",
"Pages with entries",
"Portuguese 3-syllable words",
"Portuguese entries with incorrect language header",
"Portuguese non-lemma forms",
"Portuguese noun forms",
"Portuguese terms borrowed from Latin",
"Portuguese terms derived from Latin",
"Portuguese terms with IPA pronunciation",
"Portuguese unadapted borrowings from Latin",
"Rhymes:Portuguese/ɔɾpuɾɐ",
"Rhymes:Portuguese/ɔɾpuɾɐ/3 syllables",
"Rhymes:Portuguese/ɔʁpoɾɐ",
"Rhymes:Portuguese/ɔʁpoɾɐ/3 syllables"
],
"form_of": [
{
"word": "corpus"
}
],
"glosses": [
"plural of corpus"
],
"links": [
[
"corpus",
"corpus#Portuguese"
]
],
"tags": [
"form-of",
"plural"
]
}
],
"sounds": [
{
"ipa": "/ˈkɔʁ.po.ɾɐ/",
"tags": [
"Brazil"
]
},
{
"ipa": "[ˈkɔh.po.ɾɐ]",
"tags": [
"Brazil"
]
},
{
"ipa": "/ˈkɔʁ.po.ɾɐ/",
"tags": [
"Brazil"
]
},
{
"ipa": "[ˈkɔh.po.ɾɐ]",
"tags": [
"Brazil"
]
},
{
"ipa": "/ˈkɔɾ.po.ɾɐ/",
"tags": [
"São-Paulo"
]
},
{
"ipa": "/ˈkɔʁ.po.ɾɐ/",
"tags": [
"Rio-de-Janeiro"
]
},
{
"ipa": "[ˈkɔχ.po.ɾɐ]",
"tags": [
"Rio-de-Janeiro"
]
},
{
"ipa": "/ˈkɔɻ.po.ɾɐ/",
"tags": [
"Caipira"
]
},
{
"ipa": "/ˈkɔʁ.po.ɾa/",
"tags": [
"Southern-Brazil"
]
},
{
"ipa": "[ˈkɔh.po.ɾa]",
"tags": [
"Southern-Brazil"
]
},
{
"ipa": "/ˈkɔɾ.pu.ɾɐ/",
"tags": [
"Portugal"
]
},
{
"rhymes": "-ɔʁpoɾɐ"
},
{
"rhymes": "-ɔɾpuɾɐ"
}
],
"word": "corpora"
}
Download raw JSONL data for corpora meaning in All languages combined (4.1kB)
This page is a part of the kaikki.org machine-readable All languages combined dictionary. This dictionary is based on structured data extracted on 2026-03-25 from the enwiktionary dump dated 2026-03-03 using wiktextract (05c257f and 9d9a410). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.
If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.